/**
 * Holder for the data parsed from one XML document: a document ID, a header
 * and the body text.
 *
 * The fields are public and mutable; this class performs no validation on them.
 */
public class XMLData
{
	/**
	 * Regular expression (a single character class) matching one delimiter
	 * character: the listed ASCII punctuation characters or any whitespace.
	 */
	public static final String SPLIT_TOKENS = "[!\"#$%&'()*+,./:;<=>?\\[\\]^`{|}~\\s]";

	// Compiled once so that splitText() does not recompile the regex on every call.
	private static final java.util.regex.Pattern SPLIT_PATTERN =
			java.util.regex.Pattern.compile(SPLIT_TOKENS);

	// Returned by splitText() when there is no text to split.
	private static final String[] NO_TOKENS = new String[0];

	public String header;
	public String text;
	public String docID;

	/** Creates an instance whose ID, header and text are all the empty string. */
	public XMLData()
	{
		header = "";
		docID = "";
		text = "";
	}

	/**
	 * Creates an instance from the given values. The arguments are stored as-is
	 * (no null check and no copying).
	 *
	 * @param docID  the document ID
	 * @param header the document header
	 * @param text   the document body text
	 */
	public XMLData(String docID, String header, String text)
	{
		this.docID = docID;
		this.header = header;
		this.text = text;
	}

	/**
	 * Splits {@link #text} around every character matched by {@link #SPLIT_TOKENS}.
	 *
	 * Each delimiter character is matched individually, so two adjacent
	 * delimiters (for example ", ") produce an empty string between them, and
	 * text that starts with a delimiter produces a leading empty string.
	 * Trailing empty strings are dropped. Empty text yields a one-element array
	 * containing the empty string.
	 *
	 * @return the pieces of the text, or an empty array if the text is null
	 */
	public String[] splitText()
	{
		// The text field can be null (constructor argument or direct assignment);
		// report "no tokens" instead of failing with a NullPointerException.
		if (text == null)
		{
			return NO_TOKENS;
		}
		return SPLIT_PATTERN.split(text);
	}
}
